% Conference paper. {UniT} and {IEEE/CVF} are brace-protected so that styles
% which sentence-case titles preserve their capitalisation.
@inproceedings{hu2021unit,
  author    = {Hu, Ronghang and Singh, Amanpreet},
  title     = {{UniT}: Multimodal Multitask Learning with a Unified Transformer},
  booktitle = {Proceedings of the {IEEE/CVF} International Conference on Computer Vision},
  pages     = {1439--1449},
  year      = {2021},
}